from .transformer import GPT2ParallelTransformer
from .gpt2_modeling import gpt2_get_params_for_weight_decay_optimization